package com.apex.spark.batch;

import com.apex.spark.SparkBaseSource;
import com.apex.spark.SparkEnvironment;
import org.apache.spark.sql.Dataset;
import org.apache.spark.sql.Row;

/**
 * Definition of a batch data source.
 *
 * <p>Extends {@link SparkBaseSource} and adds a single operation that yields
 * the source data as a {@code Dataset<Row>}.
 */
public interface SparkBatchSource extends SparkBaseSource {

    /**
     * Fetches the data from the source side so that it can be handed to
     * downstream processing.
     *
     * @param environment the execution environment (context) the source runs in
     * @return the source data as a {@code Dataset<Row>}
     */
    Dataset<Row> getData(SparkEnvironment environment);
}
